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#include 
#include 
#include 
#include 
#include 
# include 
#include 
# include 
#include 



<stdio.h> 
<unist"d . h> 
<errno.h> 
<stdlib .h> 



<sys/ types ,h> 
<sys/stat .h> 



<fcntl .h> 
<string . h> 
"fastdb.h" 



int FalseDigs = 0; 
int LinksFol lowed = 0; 




#ifndef GET_DIRECT 

int QueryRecord ( char *key, char *record ) 



int i ; 

unsigned short crc; 
unsigned short crcl6; 
unsigned long startoff; 
unsigned long curpos; 
•int bytes; 
char *ptr; 

keyindx_t crcbucket [CRCBUCKETSIZE+1] ; 
keyindx_t *keyptr; 
static int keyfd = -1; 
static int datafd = -1; 

// first time file open of keyindx and data file 
if ( keyfd == -1 ) 

. ( 

// open the key index file 

keyfd = open ( "keyindx" , 0_RD0NLY ); 

if ( keyfd == -1 ) 



printf ( "Can't open keyindx for write. %s\n", 

strerror ( errno ) ) ; 
exit (1) ; 



// open the Data file 

datafd = open ( "Data", O RDONLY ); 
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if ( datafd == -1) 
{ 

printf ( "Can't open Data for read. %s\n" , 

strerror ( errno ) ) ; 
close ( keyfd ) ; 
keyfd = -1; 
exit (1) ; 
} 

} 

// calculate CRC-CCITT checksum 

crcstr ( &crc, (unsigned char *) key ) ; 

#ifndef SIMPLE_HASH 

// calculate CRC-16 checksum 

crcl6str ( &crcl6, (unsigned char *) key ) ; 
tfendif 

// find right bucket 

startoff = (unsigned long) crc * (CRCBUCKETSIZE + 1) * sizeof (keyindx_t) 

while ( 1 ) 
{ 

// seek to this bucket's offset 

curpos = Iseek { keyfd, startoff, SEEK_SET ); 

if ( curpos != startoff ) 

{ 

printf ( "Iseek in keyindx file failed\n" ) ; 
exit (1) ; 

} 



// read the bucket 

if ( read ( keyfd, (char *) crcbucket, sizeof (crcbucket) ) 
!= sizeof (crcbucket) ) 

{ 

printf ( "read from keyindx file failed\n" ) ; 

exit (1) ,- 

} 

// search for crcl6 match 
keyptr = crcbucket; 

for ( i = 0; i < CRCBUCKETSIZE / i++, keyptr++ ) 
{ 

#ifndef SIMPLE_HASH 

// check for crcl6 match slot in bucket 

if ( keyptr->crcl6 == crcl6 && keyptr->of f set != MAXOFFSET ) 

#else 

// simulating simple hash, ignoring crcl6 value... 
if ( keyptr->of fset MAXOFFSET ) 

#endif 

{ 

// found match, read record for key verification... 
curpos = Iseek ( datafd, keyptr->of f set , SEEK_SET ); 
if ( curpos != keyptr->of f set ) 
{ 

printf ( "Iseek in Data file failed\n" ) ; 
exit (1) ; 
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bytes = read ( datafd, record, MAXRECORD - 1 ) ; 
if ( bytes < 2 ) 

{ 

printf ( "bad read, bytes = %d\n", 

bytes ) ; 
exit (1) ; 

} 

record [bytes] = 0; 
ptr = strchr ( record, '\n' ) ,- 
if ( !ptr ) 
{ 

printf ( "error, no new line found\n" ) ; 
exit (1) ; 

} 

*ptr = 0; 

// get first field, e-mail key is first 
ptr = strchr ( record, ' \t ' ) ; 
if ( !ptr ) 

.=1 printf ( "bad read, no tab found\n" ) ; 

C§ exit(l); 

M. } 

2 II check record (key is first record) 

*p tr = 0 '* 

;:!! if ( strcmp ( record, key ) == 0 ) 

m { 

;•' // found record 

*ptr = ' \t ■ ; 
I'" return 1 ; 

2 } 

else 

t3 { . . 

//printf ( "false dig, found: ^s'Xn", 

//record ) ; 
FalseDigs++ ; 

} 

} 



// no macth found in this bucket, check if next crcbucket is linked, 
if ( keyptr->offset == MAXOFFSET ) 

break; // no more buckets, record not found 

// follow link to next bucket... 
startoff = keyptr->of f set ; 
Links Fol lowed+ + ; 

//printf ( "Linking to next bucket at 0x%x\n" , startoff ); 
} // while ( 1 ) 



// record not found 

printf ( "record not found, key 

return ( 0 ) ; 



%s\n», key ) ; 
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} 

ttelse 
// 

// Name : Que ryRe cord 
// 

// Description: 

// Query record routine using theoritical optimal solution. 

// Does not use index file, rather it transform the search 

// key into record offset via computation. Basically, 

// provides baseline performance for random seeks/reads 

// on a large data file. 

// 

int QueryRecord ( char *key, char * record ) 

{ 

int i ; 

unsigned long startoff ,- 
unsigned long curpos; 
unsigned int rindex; 
int bytes; 
char *ptr; 

static int datafd = -1; 

// first time file open of keyindx and data file 
if ( datafd == -1 ) 
{ 

// open the Data file 
datafd = open ( "Data", 0_RDONLY ); 
if ( datafd == -1) 
{ 

printf ( "Can't open Data for read. %s\n" , 

strerror ( errno ) ) ; 
exit (1) ; 
} 

} 

// translate key into record number 
sscanf ( key, "%x", fcrindex ) ; 
startoff = {unsigned long) rindex * 100; 

// seek directly to record and read it 

curpos = lseek ( datafd, startoff, SEEK_SET ) ; 

if ( curpos != startoff ) 

{ 

printf ( "lseek in Data file failed\n" ) ; 
exit (1) ; 

} 

bytes = read ( datafd, record, MAXRECORD - 1 ) ; 
if ( bytes < 2 ) 
{ 

printf ( "bad read, bytes = %d\n", 

bytes ) ; 
exit (1) ; 

} 
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record [bytes] = 0; 
ptr = strchr ( record, ' \n' ); 
if ( !ptr ) 
{ 

printf ( "error, no new line found\n" 
exit (1) ; 

} 

*ptr = 0; 

// -get first field, e-mail key is first 
ptr = strchr ( record, ' \t 1 ); 
if ( !ptr ) 
{ 

printf ( "bad read, no tab found\n" ) ; 

exit (1) ; 

} 

// check record (key is first record) 
*ptr = 0/ 

if ( strcmp ( record, key ) == 0 ) 

{ 

// found record 
*ptr = ' \t ' ; 
return 1 ; 

} 

else 

{ 

printf ( "false dig, found: ' %s'\n", 

record ) ; 
FalseDigs++ ; 

} 

/ / record not found 

printf ( "record not found, key = %s\n", key ) 
return ( 0 ) ; 

} 

#endif // GET DIRECT solution 



